 % !Mode:: "TeX:UTF-8"
 
 @article{kuppusamy2021convolutional,
   author    = {Kuppusamy, Karthika and Eswaran, Chandra},
   title     = {Convolutional and Deep Neural Networks based techniques for extracting the age-relevant features of the speaker},
   journal   = {Journal of Ambient Intelligence and Humanized Computing},
   pages     = {1--13},
   year      = {2021},
   publisher = {Springer},
 }

@article{kersta1962voiceprint,
  author    = {Kersta, Lawrence George},
  title     = {Voiceprint identification},
  journal   = {The Journal of the Acoustical Society of America},
  volume    = {34},
  number    = {5},
  pages     = {725},
  year      = {1962},
  publisher = {Acoustical Society of America},
}

@article{atal1974effectiveness,
  author    = {Atal, Bishnu S.},
  title     = {Effectiveness of linear prediction characteristics of the speech wave for automatic speaker identification and verification},
  journal   = {The Journal of the Acoustical Society of America},
  volume    = {55},
  number    = {6},
  pages     = {1304--1312},
  year      = {1974},
  publisher = {Acoustical Society of America},
}

% US patent; the patent number is carried in the note field.
@misc{doddington1992method,
  author = {Doddington, George R. and Chen, Yeunung and Leonard, R. Gary},
  title  = {Method for utilizing formant frequencies in speech recognition},
  year   = {1992},
  month  = sep # "~8",
  note   = {US Patent 5,146,539},
}

@article{atal1976automatic,
  author    = {Atal, Bishnu S.},
  title     = {Automatic recognition of speakers from their voices},
  journal   = {Proceedings of the IEEE},
  volume    = {64},
  number    = {4},
  pages     = {460--475},
  year      = {1976},
  publisher = {IEEE},
}

@article{davis1980comparison,
  author    = {Davis, Steven and Mermelstein, Paul},
  title     = {Comparison of parametric representations for monosyllabic word recognition in continuously spoken sentences},
  journal   = {IEEE Transactions on Acoustics, Speech, and Signal Processing},
  volume    = {28},
  number    = {4},
  pages     = {357--366},
  year      = {1980},
  publisher = {IEEE},
}

@article{sakoe1978dynamic,
  author    = {Sakoe, Hiroaki and Chiba, Seibi},
  title     = {Dynamic programming algorithm optimization for spoken word recognition},
  journal   = {IEEE Transactions on Acoustics, Speech, and Signal Processing},
  volume    = {26},
  number    = {1},
  pages     = {43--49},
  year      = {1978},
  publisher = {IEEE},
}

@inproceedings{mishra2012vector,
  author    = {Mishra, Poonam},
  title     = {A vector quantization approach to speaker recognition},
  booktitle = {Proceedings of International Conference on Innovation \& Research in Technology for Sustainable Development},
  pages     = {152--155},
  year      = {2012},
}

@inproceedings{rosenberg1990sub,
  author       = {Rosenberg, Aaron E. and Lee, Chin-Hui and Soong, Frank K.},
  title        = {Sub-word unit talker verification using hidden {Markov} models},
  booktitle    = {International Conference on Acoustics, Speech, and Signal Processing},
  pages        = {269--272},
  year         = {1990},
  organization = {IEEE},
}

@article{farrell1994speaker,
  author    = {Farrell, Kevin R. and Mammone, Richard J. and Assaleh, Khaled T.},
  title     = {Speaker recognition using neural networks and conventional classifiers},
  journal   = {IEEE Transactions on Speech and Audio Processing},
  volume    = {2},
  number    = {1},
  pages     = {194--205},
  year      = {1994},
  publisher = {IEEE},
}

@article{reynolds1995speaker,
  author    = {Reynolds, Douglas A.},
  title     = {Speaker identification and verification using {Gaussian} mixture speaker models},
  journal   = {Speech Communication},
  volume    = {17},
  number    = {1--2},
  pages     = {91--108},
  year      = {1995},
  publisher = {Elsevier},
}

@article{reynolds2000speaker,
  author    = {Reynolds, Douglas A. and Quatieri, Thomas F. and Dunn, Robert B.},
  title     = {Speaker verification using adapted {Gaussian} mixture models},
  journal   = {Digital Signal Processing},
  volume    = {10},
  number    = {1--3},
  pages     = {19--41},
  year      = {2000},
  publisher = {Elsevier},
}

@article{kenny2005eigenvoice,
  author    = {Kenny, Patrick and Boulianne, Gilles and Dumouchel, Pierre},
  title     = {Eigenvoice modeling with sparse training data},
  journal   = {IEEE Transactions on Speech and Audio Processing},
  volume    = {13},
  number    = {3},
  pages     = {345--354},
  year      = {2005},
  publisher = {IEEE},
}

% CRIM technical report. The report identifier previously sat in the journal
% field; it is now split into institution / address / number.
% NOTE(review): the scraped volume (14) and pages (28--29) were dropped as
% export artifacts; confirm the year against the report itself.
@techreport{kenny2005joint,
  author      = {Kenny, Patrick},
  title       = {Joint factor analysis of speaker and session variability: Theory and algorithms},
  institution = {CRIM},
  address     = {Montreal},
  number      = {CRIM-06/08-13},
  year        = {2005},
}

@inproceedings{vogt2005modelling,
  author       = {Vogt, Robert and Baker, Brendan and Sridharan, Subramanian},
  title        = {Modelling session variability in text-independent speaker verification},
  booktitle    = {Eurospeech/Interspeech: Proceedings of the 9th European Conference on Speech Communication and Technology 2005},
  pages        = {3117--3120},
  year         = {2005},
  organization = {Institut f{\"u}r Kommunikationsforschung und Phonetik (ISCA), Universit{\"a}t Bonn},
}

% NOTE(review): year set to the issue year of volume 19 (2011); the previous
% value (2010) looks like the early-access date. Confirm against the publisher record.
@article{dehak2010front,
  author    = {Dehak, Najim and Kenny, Patrick J. and Dehak, R{\'e}da and Dumouchel, Pierre and Ouellet, Pierre},
  title     = {Front-end factor analysis for speaker verification},
  journal   = {IEEE Transactions on Audio, Speech, and Language Processing},
  volume    = {19},
  number    = {4},
  pages     = {788--798},
  year      = {2011},
  publisher = {IEEE},
}

@inproceedings{long2008sipca,
  author       = {Long, Yanhua and Guo, Wu and Dai, Lirong},
  title        = {An {SIPCA-WCCN} method for {SVM}-based speaker verification system},
  booktitle    = {2008 International Conference on Audio, Language and Image Processing},
  pages        = {1295--1299},
  year         = {2008},
  organization = {IEEE},
}

% NOTE(review): the page field was a broken range ("I" to "629"); restored to
% the volume-prefixed form I-629 to I-632. Confirm the end page against IEEE Xplore.
@inproceedings{solomonoff2005advances,
  author       = {Solomonoff, Alex and Campbell, William M. and Boardman, Ian},
  title        = {Advances in channel compensation for {SVM} speaker recognition},
  booktitle    = {Proceedings of the IEEE International Conference on Acoustics, Speech, and Signal Processing (ICASSP)},
  volume       = {1},
  pages        = {I-629--I-632},
  year         = {2005},
  organization = {IEEE},
}

% NOTE(review): year set to the issue year of volume 20 (2012); the previous
% value (2011) looks like the early-access date. Confirm against the publisher record.
@article{mclaren2011source,
  author    = {McLaren, Mitchell and van Leeuwen, David},
  title     = {Source-normalized {LDA} for robust speaker recognition using i-vectors from multiple speech sources},
  journal   = {IEEE Transactions on Audio, Speech, and Language Processing},
  volume    = {20},
  number    = {3},
  pages     = {755--766},
  year      = {2012},
  publisher = {IEEE},
}

@inproceedings{prince2007probabilistic,
  author       = {Prince, Simon J. D. and Elder, James H.},
  title        = {Probabilistic linear discriminant analysis for inferences about identity},
  booktitle    = {2007 IEEE 11th International Conference on Computer Vision},
  pages        = {1--8},
  year         = {2007},
  organization = {IEEE},
}

@article{hinton2006fast,
  author    = {Hinton, Geoffrey E. and Osindero, Simon and Teh, Yee-Whye},
  title     = {A fast learning algorithm for deep belief nets},
  journal   = {Neural Computation},
  volume    = {18},
  number    = {7},
  pages     = {1527--1554},
  year      = {2006},
  publisher = {MIT Press},
}

@inproceedings{lei2014novel,
  author       = {Lei, Yun and Scheffer, Nicolas and Ferrer, Luciana and McLaren, Mitchell},
  title        = {A novel scheme for speaker recognition using a phonetically-aware deep neural network},
  booktitle    = {2014 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
  pages        = {1695--1699},
  year         = {2014},
  organization = {IEEE},
}

% NOTE(review): booktitle expanded from the bare "Odyssey"; the volume field,
% which only repeated the year, was removed.
@inproceedings{kenny2014deep,
  author    = {Kenny, Patrick and Stafylakis, Themos and Ouellet, Pierre and Gupta, Vishwa and Alam, Md Jahangir},
  title     = {Deep Neural Networks for extracting {Baum-Welch} statistics for Speaker Recognition},
  booktitle = {Odyssey 2014: The Speaker and Language Recognition Workshop},
  pages     = {293--298},
  year      = {2014},
}

@inproceedings{heigold2016end,
  author       = {Heigold, Georg and Moreno, Ignacio and Bengio, Samy and Shazeer, Noam},
  title        = {End-to-end text-dependent speaker verification},
  booktitle    = {2016 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
  pages        = {5115--5119},
  year         = {2016},
  organization = {IEEE},
}

@inproceedings{snyder2017deep,
  author    = {Snyder, David and Garcia-Romero, Daniel and Povey, Daniel and Khudanpur, Sanjeev},
  title     = {Deep Neural Network Embeddings for Text-Independent Speaker Verification},
  booktitle = {Interspeech},
  pages     = {999--1003},
  year      = {2017},
}

% arXiv preprint; the scraped volume number (650) was removed because preprints have no volume.
@article{li2017deep,
  author  = {Li, Chao and Ma, Xiaokong and Jiang, Bing and Li, Xiangang and Zhang, Xuewei and Liu, Xiao and Cao, Ying and Kannan, Ajay and Zhu, Zhenyao},
  title   = {{Deep Speaker}: an end-to-end neural speaker embedding system},
  journal = {arXiv preprint arXiv:1705.02304},
  year    = {2017},
}

% NOTE(review): year set to the issue year of volume 20 (2012); the previous
% value (2011) looks like the early-access date. Confirm against the publisher record.
@article{dahl2011context,
  author    = {Dahl, George E. and Yu, Dong and Deng, Li and Acero, Alex},
  title     = {Context-dependent pre-trained deep neural networks for large-vocabulary speech recognition},
  journal   = {IEEE Transactions on Audio, Speech, and Language Processing},
  volume    = {20},
  number    = {1},
  pages     = {30--42},
  year      = {2012},
  publisher = {IEEE},
}

% Previously typed as a journal article with no journal field (a required field).
% NOTE(review): venue and pages (Interspeech 2014, pp. 338--342) were added from
% memory of the ISCA archive listing; confirm before relying on them.
@inproceedings{sak2014long,
  author    = {Sak, Hasim and Senior, Andrew W. and Beaufays, Fran{\c{c}}oise},
  title     = {Long short-term memory recurrent neural network architectures for large scale acoustic modeling},
  booktitle = {Fifteenth Annual Conference of the International Speech Communication Association},
  pages     = {338--342},
  year      = {2014},
}

@inproceedings{variani2014deep,
  author       = {Variani, Ehsan and Lei, Xin and McDermott, Erik and Moreno, Ignacio Lopez and Gonzalez-Dominguez, Javier},
  title        = {Deep neural networks for small footprint text-dependent speaker verification},
  booktitle    = {2014 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
  pages        = {4052--4056},
  year         = {2014},
  organization = {IEEE},
}

@article{nagrani2017voxceleb,
  author  = {Nagrani, Arsha and Chung, Joon Son and Zisserman, Andrew},
  title   = {{VoxCeleb}: a large-scale speaker identification dataset},
  journal = {arXiv preprint arXiv:1706.08612},
  year    = {2017},
}

@inproceedings{ko2017study,
  author       = {Ko, Tom and Peddinti, Vijayaditya and Povey, Daniel and Seltzer, Michael L. and Khudanpur, Sanjeev},
  title        = {A study on data augmentation of reverberant speech for robust speech recognition},
  booktitle    = {2017 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
  pages        = {5220--5224},
  year         = {2017},
  organization = {IEEE},
}

@article{snyder2015musan,
  author  = {Snyder, David and Chen, Guoguo and Povey, Daniel},
  title   = {{MUSAN}: A music, speech, and noise corpus},
  journal = {arXiv preprint arXiv:1510.08484},
  year    = {2015},
}

@article{waibel1989phoneme,
  author    = {Waibel, Alex and Hanazawa, Toshiyuki and Hinton, Geoffrey and Shikano, Kiyohiro and Lang, Kevin J.},
  title     = {Phoneme recognition using time-delay neural networks},
  journal   = {IEEE Transactions on Acoustics, Speech, and Signal Processing},
  volume    = {37},
  number    = {3},
  pages     = {328--339},
  year      = {1989},
  publisher = {IEEE},
}

@inproceedings{peddinti2015time,
  author    = {Peddinti, Vijayaditya and Povey, Daniel and Khudanpur, Sanjeev},
  title     = {A time delay neural network architecture for efficient modeling of long temporal contexts},
  booktitle = {Sixteenth Annual Conference of the International Speech Communication Association},
  year      = {2015},
}

@inproceedings{snyder2015time,
  author       = {Snyder, David and Garcia-Romero, Daniel and Povey, Daniel},
  title        = {Time delay deep neural network-based universal background models for speaker recognition},
  booktitle    = {2015 IEEE Workshop on Automatic Speech Recognition and Understanding (ASRU)},
  pages        = {92--97},
  year         = {2015},
  organization = {IEEE},
}

@inproceedings{snyder2018x,
  author       = {Snyder, David and Garcia-Romero, Daniel and Sell, Gregory and Povey, Daniel and Khudanpur, Sanjeev},
  title        = {X-vectors: Robust {DNN} embeddings for speaker recognition},
  booktitle    = {2018 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
  pages        = {5329--5333},
  year         = {2018},
  organization = {IEEE},
}

% Book chapter; previously typed as a journal article with scraped
% volume/number values and the year in the pages field.
% NOTE(review): editor, publisher and pages (255--258) were added from memory of
% the standard citation for this chapter; confirm against the book.
@incollection{lecun1995convolutional,
  author    = {LeCun, Yann and Bengio, Yoshua},
  title     = {Convolutional networks for images, speech, and time series},
  booktitle = {The Handbook of Brain Theory and Neural Networks},
  editor    = {Arbib, Michael A.},
  publisher = {MIT Press},
  pages     = {255--258},
  year      = {1995},
}

@inproceedings{abdel2012applying,
  author       = {Abdel-Hamid, Ossama and Mohamed, Abdel-rahman and Jiang, Hui and Penn, Gerald},
  title        = {Applying convolutional neural networks concepts to hybrid {NN-HMM} model for speech recognition},
  booktitle    = {2012 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)},
  pages        = {4277--4280},
  year         = {2012},
  organization = {IEEE},
}

@inproceedings{he2016deep,
  author    = {He, Kaiming and Zhang, Xiangyu and Ren, Shaoqing and Sun, Jian},
  title     = {Deep residual learning for image recognition},
  booktitle = {Proceedings of the IEEE conference on computer vision and pattern recognition},
  pages     = {770--778},
  year      = {2016},
}

@inproceedings{hu2018squeeze,
  author    = {Hu, Jie and Shen, Li and Sun, Gang},
  title     = {Squeeze-and-excitation networks},
  booktitle = {Proceedings of the IEEE conference on computer vision and pattern recognition},
  pages     = {7132--7141},
  year      = {2018},
}

@inproceedings{liu2017sphereface,
  author    = {Liu, Weiyang and Wen, Yandong and Yu, Zhiding and Li, Ming and Raj, Bhiksha and Song, Le},
  title     = {{SphereFace}: Deep hypersphere embedding for face recognition},
  booktitle = {Proceedings of the IEEE conference on computer vision and pattern recognition},
  pages     = {212--220},
  year      = {2017},
}

@article{wang2018additive,
  author    = {Wang, Feng and Cheng, Jian and Liu, Weiyang and Liu, Haijun},
  title     = {Additive margin softmax for face verification},
  journal   = {IEEE Signal Processing Letters},
  volume    = {25},
  number    = {7},
  pages     = {926--930},
  year      = {2018},
  publisher = {IEEE},
}

@inproceedings{wang2018cosface,
  author    = {Wang, Hao and Wang, Yitong and Zhou, Zheng and Ji, Xing and Gong, Dihong and Zhou, Jingchao and Li, Zhifeng and Liu, Wei},
  title     = {{CosFace}: Large margin cosine loss for deep face recognition},
  booktitle = {Proceedings of the IEEE conference on computer vision and pattern recognition},
  pages     = {5265--5274},
  year      = {2018},
}

@inproceedings{deng2019arcface,
  author    = {Deng, Jiankang and Guo, Jia and Xue, Niannan and Zafeiriou, Stefanos},
  title     = {{ArcFace}: Additive angular margin loss for deep face recognition},
  booktitle = {Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition},
  pages     = {4690--4699},
  year      = {2019},
}